#!/usr/bin/env bash
#
# Launches train.py with a fixed set of command-line options (datasets,
# Whisper size "small", language "mn,Mongolian", batch sizes, step count, ...).
#
# Usage:
#   HF_USERNAME=<name> MODEL_VERSION=<version> bash <this-script>
#
# Required environment variables:
#   HF_USERNAME    - your Hugging Face username; passed to --hf-username.
#   MODEL_VERSION  - version number to be added to the resulting model card;
#                    passed to --version.
#
# Why environment variables: the previous template embedded bare
# <placeholder> tokens in the command line. Unquoted '<' and '>' are shell
# redirection operators, so the script did not even parse until the
# placeholders were hand-edited. Reading the values from the environment keeps
# the script runnable as-is and fails early with a clear message when a value
# is missing.
#
# NOTE(review): --train_datasets / --eval_datasets are spelled with
# underscores while every other flag uses hyphens. Left unchanged here;
# confirm against the argument parser in train.py.

# Abort before starting python if a required value is unset or empty.
: "${HF_USERNAME:?set HF_USERNAME to your Hugging Face username}"
: "${MODEL_VERSION:?set MODEL_VERSION to the version number for the resulting model card}"

python train.py \
    --train_datasets "mozilla-foundation/common_voice_11_0|mn|train+validation,google/fleurs|mn_mn|train+validation" \
    --eval_datasets "mozilla-foundation/common_voice_11_0|mn|test" \
    --whisper-size "small" \
    --language "mn,Mongolian" \
    --keep-chars " абвгдеёжзийклмноөпрстуүфхцчшъыьэюя.,?!" \
    --train-batch-size 32 \
    --eval-batch-size 16 \
    --max-steps 15000 \
    --num-workers 8 \
    --hf-username "${HF_USERNAME}" \
    --use-cached-dataset \
    --merge-audio-to-max \
    --version "${MODEL_VERSION}"
